# Level-one (top-level) heading rules.
# Each entry pairs a regex with a "pdf_type" tag; the pattern accepts
# "第" + one or more Chinese numerals (一..十) + one of 章 / 节 / 条 at the
# start of a line.
# NOTE(review): "pdf_type" presumably names the document type this rule
# applies to — confirm against the code that consumes it.
first_level = [
    dict(
        pattern=r'^第[一二三四五六七八九十]+[章节条]',
        pdf_type='募集说明书',
    ),
]

# Regex rules for headings that follow a regular numbering scheme.
# Each entry has:
#   "pattern": a regex anchored at the start of the line
#   "sample":  an example heading the pattern is meant to recognise
#
# Chapter / section / article headings (第X章, 第X节, 第X条) are deliberately
# not listed here: the combined pattern in `first_level` covers all three.
rules_regex = [
    {
        # Chinese numeral followed by an ideographic comma: 一、
        "pattern": r"^[一二三四五六七八九十]+、",
        "sample": "一、发行人主体提示"
    },
    {
        # Chinese numeral in half- or full-width parentheses: （一）
        "pattern": r"^[(（][一二三四五六七八九十]+[)）]",
        "sample": "（一）核心风险提示"
    },
    {
        # Arabic number followed by an ideographic comma: 1、
        "pattern": r"^\d+、",
        "sample": "1、原材料价格波动风险"
    },
    {
        # Arabic number in half- or full-width parentheses: （1）
        "pattern": r"^[(（]\d+[)）]",
        "sample": "（1）证券业务"
    },
    {
        # Arabic number followed by a closing parenthesis only: 2）
        "pattern": r"^\d+[)）]",
        "sample": "2）资本公积"
    },
    {
        # One-level dotted number; the character after the dot must be
        # neither a dot nor a digit, so "1.1" is left to the next rule.
        "pattern": r"^\d+\.[^\.\d]",
        "sample": "1.董事会"
    },
    {
        # Two-level dotted number; the following character must not be a dot.
        "pattern": r"^\d+\.\d+[^\.]",
        "sample": "1.1董事会"
    },
    {
        # Three-level dotted number; the following character must not be a dot.
        "pattern": r"^\d+\.\d+\.\d+[^\.]",
        "sample": "1.1.1董事会"
    },
    {
        # Four-level dotted number; the following character must not be a dot.
        "pattern": r"^\d+\.\d+\.\d+\.\d+[^\.]",
        "sample": "1.1.1.1董事会"
    },
    {
        # Lower-case ASCII letter followed by an ideographic comma: c、
        "pattern": r"^[a-z]、",
        "sample": "c、管理人决策会"
    },
    {
        # ASCII letter followed by 、, "." or a space.
        # The class is spelled [A-Za-z] rather than [A-z]: the range A-z also
        # spans the punctuation between "Z" and "a" ([ \ ] ^ _ `), which
        # would wrongly treat lines such as "_ foo" as headings.
        "pattern": r"^[A-Za-z][、\. ]",
        "sample": "A、管理人决策会 A.管理人决策会 A 管理人决策会"
    },
    {
        # Circled digit ① .. ⑩ at the start of the line.
        "pattern": r"^[①②③④⑤⑥⑦⑧⑨⑩]",
        "sample": "①"
    }
]
# Rebind rules_regex to a new list: level-one heading rules first, then the
# numbered-heading rules in their existing order.
rules_regex = [*first_level, *rules_regex]
# Match rules for headings that do not follow a numbering scheme.
# Same entry layout as the numbered rules ("pattern" + "sample").
# Note the pattern carries no "^" anchor.
no_rules_regex = [
    dict(
        pattern=r"附表[一二三四五六七八九十]+：",
        sample="附表一：",
    ),
]